
## Various descriptive statistics are calculated in this file. There may not be much in it yet, but this is where this type of analysis belongs.

# Load the alias -> canonical-name mapping. The file is read as tab-separated
# text with no header row, so the two columns are named explicitly below.
nameDF <- read.delim("debian_aliases.tsv", header = FALSE,
                     stringsAsFactors = FALSE)
colnames(nameDF) <- c("alias", "canonical.name")
head(nameDF)

# Number of distinct canonical names.
length(unique(nameDF$canonical.name))

# Two-column matrix holding the alias and canonical name of every row.
namelist <- cbind(nameDF$alias, nameDF$canonical.name)

# Number of distinct names appearing in either column. The matrix is flattened
# first: unique() on a matrix de-duplicates whole rows and length() of a matrix
# counts every cell, so length(unique(namelist)) would report twice the number
# of distinct (alias, canonical) pairs rather than a count of names.
length(unique(as.vector(namelist)))

# Total number of alias entries (one per row of nameDF).
length(nameDF$alias)
